\relax 
\providecommand\hyper@newdestlabel[2]{}
\providecommand\HyperFirstAtBeginDocument{\AtBeginDocument}
\HyperFirstAtBeginDocument{\ifx\hyper@anchor\@undefined
\global\let\oldcontentsline\contentsline
\gdef\contentsline#1#2#3#4{\oldcontentsline{#1}{#2}{#3}}
\global\let\oldnewlabel\newlabel
\gdef\newlabel#1#2{\newlabelxx{#1}#2}
\gdef\newlabelxx#1#2#3#4#5#6{\oldnewlabel{#1}{{#2}{#3}}}
\AtEndDocument{\ifx\hyper@anchor\@undefined
\let\contentsline\oldcontentsline
\let\newlabel\oldnewlabel
\fi}
\fi}
\global\let\hyper@last\relax 
\gdef\HyperFirstAtBeginDocument#1{#1}
\providecommand\HyField@AuxAddToFields[1]{}
\providecommand\HyField@AuxAddToCoFields[2]{}
\@writefile{toc}{\contentsline {chapter}{Summary}{vi}{dummy.2}}
\@writefile{toc}{\contentsline {chapter}{Samenvatting}{vii}{dummy.3}}
\@writefile{toc}{\contentsline {chapter}{Acknowledgements}{viii}{dummy.4}}
\@writefile{toc}{\vspace  {1em}}
\@writefile{toc}{\contentsline {chapter}{List of Figures}{xiii}{dummy.6}}
\@writefile{toc}{\contentsline {chapter}{List of Tables}{xv}{dummy.8}}
\citation{dorneles_approximate_2011,elmagarmid_duplicate_2007,spaccapietra_survey_2005}
\citation{citeulike:1176986}
\citation{bizer_linked_2009}
\citation{elmagarmid_duplicate_2007,DBLP:books/daglib/0030287,DBLP:journals/dke/KopckeR10,dorneles_approximate_2011}
\citation{DBLP:journals/vldb/RahmB01,DBLP:journals/sigmod/Noy04,DBLP:journals/aim/DoanH05,DBLP:journals/jwe/KonstantinouSM08,DBLP:journals/tkde/ShvaikoE13}
\citation{DBLP:journals/internet/FreitasCOO12}
\@writefile{toc}{\vspace  {2em}}
\@writefile{toc}{\contentsline {chapter}{\numberline {1}Introduction}{1}{chapter.10}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{Chapter1}{{1}{1}{Introduction}{chapter.10}{}}
\newlabel{chapter:introduction}{{1}{1}{Introduction}{chapter.10}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {1.1}{\ignorespaces Snapshot of Linked Open Data Project in 2011.\relax }}{2}{figure.caption.11}}
\providecommand*\caption@xref[2]{\@setref\relax\@undefined{#1}}
\newlabel{fig:lod}{{1.1}{2}{Snapshot of Linked Open Data Project in 2011.\relax }{figure.caption.11}{}}
\@writefile{toc}{\contentsline {section}{\numberline {1.1}A Brief Overview of Instance Matching}{3}{section.12}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.1.1}What is instance matching?}{3}{subsection.13}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.1.2}How does it work?}{3}{subsection.24}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.1.3}Why is it challenging to do instance matching on Linked Data?}{4}{subsection.25}}
\@writefile{toc}{\contentsline {section}{\numberline {1.2}Thesis Scope and Outline}{4}{section.26}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.1}Towards Self-Linking Linked Data}{4}{subsection.27}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.2}SERIMI: Class-based Matching for Instance Matching Across Heterogeneous Datasets}{4}{subsection.28}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.3}Efficient and Effective On-the-fly Candidate Selection over Sparql Endpoints}{5}{subsection.29}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.4}Learning Edit-Distance Based String Transformation Rules From Examples}{5}{subsection.30}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.5}Exercises on Knowledge Based Acceleration}{6}{subsection.31}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.2.6}Conclusions}{7}{subsection.32}}
\citation{citeulike:1176986}
\citation{bizer_linked_2009}
\citation{DBLP:conf/www/Berners-LeeHLPPS08}
\citation{DBLP:conf/swap/dAquinSMAGLZ08}
\citation{DBLP:conf/www/AraujoS09}
\citation{DBLP:journals/ws/HoganHUKPD11}
\citation{DBLP:conf/semweb/HalpinHMMT10}
\citation{DBLP:conf/semweb/HuS10}
\citation{DBLP:conf/semweb/MillardGSS10}
\citation{DBLP:conf/rr/Hogan11}
\citation{DBLP:conf/aaaiss/JainHYVS10}
\citation{DBLP:journals/ws/HoganUHCPD12}
\citation{DBLP:conf/aaaiss/TummarelloD10}
\@writefile{toc}{\contentsline {chapter}{\numberline {2}Towards a self-linking Linked Data }{9}{chapter.33}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{chapter:vision}{{2}{9}{Towards a self-linking Linked Data}{chapter.33}{}}
\@writefile{toc}{\contentsline {section}{\numberline {2.1}Introduction}{9}{section.34}}
\citation{DBLP:conf/webdb/AraujoTDHS12}
\citation{DBLP:conf/semweb/EuzenatFHHMNRSSSST11}
\@writefile{lof}{\contentsline {figure}{\numberline {2.1}{\ignorespaces Overview of the structures of in self-linking Linked Data.\relax }}{11}{figure.caption.39}}
\newlabel{fig:organic}{{2.1}{11}{Overview of the structures of in self-linking Linked Data.\relax }{figure.caption.39}{}}
\@writefile{toc}{\contentsline {section}{\numberline {2.2}A General Architecture}{11}{section.40}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.1}Building a Self-Linking Linked Data}{11}{subsection.41}}
\citation{MichelsonK06}
\citation{DBLP:conf/webdb/IseleJB11}
\citation{DBLP:conf/wsdm/PapadakisINPN12}
\citation{DBLP:conf/webdb/IseleJB11}
\citation{fellegi_theory_1969,DBLP:conf/www/VolzBGK09}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.2}Interlinking as a Query Problem}{12}{subsection.42}}
\citation{dorneles_approximate_2011}
\@writefile{lof}{\contentsline {figure}{\numberline {2.2}{\ignorespaces Interlinking Apparatus inside Linked Data Endpoints. \relax }}{14}{figure.caption.43}}
\newlabel{fig:interlinking}{{2.2}{14}{Interlinking Apparatus inside Linked Data Endpoints. \relax }{figure.caption.43}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.3}Self-linking Policies}{14}{subsection.44}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.4}SPARQL Extensions to Support Self-linking}{14}{subsection.45}}
\citation{DBLP:conf/semweb/HartigBF09}
\citation{DBLP:series/sci/GorlitzS11}
\citation{DBLP:conf/semweb/SchwarteHHSS11}
\citation{hu_bootstrapping_2011}
\citation{nikolov08}
\citation{DBLP:journals/pvldb/SuchanekAS11}
\citation{DBLP:conf/semweb/SongH11}
\citation{DBLP:conf/semweb/RongNXWYY12}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2.5}Standardization of Interlinking Algorithms}{15}{subsection.48}}
\@writefile{toc}{\contentsline {section}{\numberline {2.3}Proof of Concept}{15}{section.49}}
\citation{DBLP:conf/semweb/SchultzMIBB11}
\@writefile{toc}{\contentsline {section}{\numberline {2.4}Future Work}{16}{section.53}}
\citation{DBLP:journals/pvldb/IseleB12}
\citation{DBLP:conf/semweb/SongH11}
\citation{hu_bootstrapping_2011}
\citation{DBLP:conf/www/AlexanderCHZ09}
\@writefile{toc}{\contentsline {section}{\numberline {2.5}Conclusion}{17}{section.54}}
\@writefile{toc}{\contentsline {chapter}{\numberline {3}SERIMI: Class-based Matching for Instance Matching Across Heterogeneous Datasets}{19}{chapter.55}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{chapter:serimi}{{3}{19}{SERIMI: Class-based Matching for Instance Matching Across Heterogeneous Datasets}{chapter.55}{}}
\citation{DBLP:conf/ecai/EuzenatV04,DBLP:conf/iceis/LemeCBF09,DBLP:conf/semweb/NiuRZW11}
\citation{dorneles_approximate_2011}
\citation{fellegi_theory_1969}
\@writefile{lot}{\contentsline {table}{\numberline {3.1}{\ignorespaces Instances represented as RDF triples.\relax }}{20}{table.caption.58}}
\newlabel{table:examples}{{3.1}{20}{Instances represented as RDF triples.\relax }{table.caption.58}{}}
\@writefile{toc}{\contentsline {section}{\numberline {3.1}Introduction}{20}{section.56}}
\citation{Euzenat10,DBLP:conf/semweb/EuzenatFHHMNRSSSST11}
\@writefile{lof}{\contentsline {figure}{\numberline {3.1}{\ignorespaces Examples of instances that share a common attribute value.\relax }}{21}{figure.caption.60}}
\newlabel{fig:graphexample1}{{3.1}{21}{Examples of instances that share a common attribute value.\relax }{figure.caption.60}{}}
\citation{DBLP:journals/pvldb/SuchanekAS11}
\citation{DBLP:journals/pvldb/WangLYF11}
\@writefile{lof}{\contentsline {figure}{\numberline {3.2}{\ignorespaces Class-based matching.\relax }}{22}{figure.caption.61}}
\newlabel{fig:graphexample2}{{3.2}{22}{Class-based matching.\relax }{figure.caption.61}{}}
\@writefile{toc}{\contentsline {section}{\numberline {3.2}Preliminary Definitions}{23}{section.62}}
\newlabel{chapter:serimi2}{{3.2}{23}{Preliminary Definitions}{section.62}{}}
\newlabel{definition:featuredef}{{3.3}{23}{Features}{theorem.65}{}}
\@writefile{toc}{\contentsline {section}{\numberline {3.3}Overview of the Approach}{24}{section.67}}
\newlabel{chapter:serimi3}{{3.3}{24}{Overview of the Approach}{section.67}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {3.3}{\ignorespaces The instance matching in SERIMI.\relax }}{24}{figure.caption.68}}
\newlabel{fig:overview}{{3.3}{24}{The instance matching in SERIMI.\relax }{figure.caption.68}{}}
\citation{hernandez_merge/purge_1995,mccallum_efficient_2000,papadakis_efficient_2011}
\citation{DBLP:journals/pvldb/ArasuCK09}
\citation{DBLP:journals/pvldb/WangLYF11,DBLP:journals/pvldb/SuchanekAS11}
\citation{DBLP:journals/pvldb/WangLYF11,DBLP:journals/pvldb/SuchanekAS11}
\citation{DBLP:journals/pvldb/SuchanekAS11,hu_bootstrapping_2011,Song:2011:AGD:2063016.2063058}
\citation{Song:2011:AGD:2063016.2063058}
\newlabel{eq:sim}{{3.2}{26}{Overview of the Approach}{equation.70}{}}
\citation{typifier}
\@writefile{toc}{\contentsline {section}{\numberline {3.4}Class-Based Matching}{27}{section.71}}
\newlabel{chapter:serimi4}{{3.4}{27}{Class-Based Matching}{section.71}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.4.1}Formal Definition}{27}{subsection.73}}
\newlabel{eq:opt}{{3.3}{27}{Class-based Matching (CBM)}{equation.75}{}}
\citation{DBLP:journals/eor/AlidaeeGKW07}
\@writefile{toc}{\contentsline {section}{\numberline {3.5}Class-based Matching: A Solution}{29}{section.78}}
\newlabel{chapter:serimi5}{{3.5}{29}{Class-based Matching: A Solution}{section.78}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.5.1}Basic Solution}{29}{subsection.79}}
\newlabel{eq:urds}{{3.5}{30}{Basic Solution}{equation.80}{}}
\citation{tversky1977features}
\@writefile{lof}{\contentsline {figure}{\numberline {3.4}{\ignorespaces (a) Class-based similarity score for the candidate $t_{11}$ is obtained by comparing it with $C(s_2)$ and $C(s_3)$, (b) the score for $t_{11}$ and (c) the scores for all other candidates.\relax }}{31}{figure.caption.83}}
\newlabel{fig:computation}{{3.4}{31}{(a) Class-based similarity score for the candidate $t_{11}$ is obtained by comparing it with $C(s_2)$ and $C(s_3)$, (b) the score for $t_{11}$ and (c) the scores for all other candidates.\relax }{figure.caption.83}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {1}{\ignorespaces SimScores($C(S)$).\relax }}{32}{algorithm.84}}
\newlabel{alg:sim}{{1}{32}{SimScores($C(S)$).\relax }{ALC@unique.104}{}}
\newlabel{eq:setsimsr}{{3.9}{32}{Basic Solution}{equation.106}{}}
\newlabel{theorem:t1}{{3.7}{33}{}{theorem.107}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.5.2}Reducing the Number of Comparisons}{33}{subsection.108}}
\newlabel{sec:setreduction}{{3.5.2}{33}{Reducing the Number of Comparisons}{subsection.108}{}}
\citation{DBLP:journals/pvldb/WangLYF11,DBLP:conf/vldb/ChaudhuriCGK07}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.5.3}Selecting the Threshold}{34}{subsection.129}}
\newlabel{sec:threshold}{{3.5.3}{34}{Selecting the Threshold}{subsection.129}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {2}{\ignorespaces CandidateSetsReduction($C(S)$).\relax }}{35}{algorithm.114}}
\newlabel{alg:setreduction}{{2}{35}{CandidateSetsReduction($C(S)$).\relax }{ALC@unique.128}{}}
\citation{chauvenet}
\citation{DBLP:journals/pvldb/SuchanekAS11}
\citation{DBLP:journals/pvldb/WangLYF11}
\@writefile{toc}{\contentsline {section}{\numberline {3.6}Evaluation}{36}{section.154}}
\newlabel{chapter:serimi6}{{3.6}{36}{Evaluation}{section.154}{}}
\newlabel{sec:evaluation}{{3.6}{36}{Evaluation}{section.154}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {3}{\ignorespaces ThresholdBasedSelection($C$).\relax }}{37}{algorithm.135}}
\newlabel{alg:delta}{{3}{37}{ThresholdBasedSelection($C$).\relax }{ALC@unique.153}{}}
\@writefile{lot}{\contentsline {table}{\numberline {3.2}{\ignorespaces Number of triples in each dataset.\relax }}{38}{table.caption.156}}
\newlabel{table:datadescription}{{3.2}{38}{Number of triples in each dataset.\relax }{table.caption.156}{}}
\@writefile{lot}{\contentsline {table}{\numberline {3.3}{\ignorespaces Dataset pairs representing matching tasks, number of comparable predicates (CP) for every task, number of correct matches (Match), number of candidate matches obtained from candidate selection (Cand), mean (MEAN) and standard deviation (STDV) of the number of candidates per instance.\relax }}{38}{table.caption.159}}
\newlabel{table:mappingpairs}{{3.3}{38}{Dataset pairs representing matching tasks, number of comparable predicates (CP) for every task, number of correct matches (Match), number of candidate matches obtained from candidate selection (Cand), mean (MEAN) and standard deviation (STDV) of the number of candidates per instance.\relax }{table.caption.159}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.6.1}Task Analysis}{39}{subsection.160}}
\newlabel{eq:tc}{{3.14}{40}{Task Analysis}{equation.165}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {3.5}{\ignorespaces F1 for tasks with increasing complexity.\relax }}{41}{figure.caption.166}}
\newlabel{fig:taskvsf1}{{3.5}{41}{F1 for tasks with increasing complexity.\relax }{figure.caption.166}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {3.6}{\ignorespaces Coverage and discriminative power of predicates in the target datasets.\relax }}{42}{figure.caption.167}}
\newlabel{fig:coverage}{{3.6}{42}{Coverage and discriminative power of predicates in the target datasets.\relax }{figure.caption.167}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {3.7}{\ignorespaces Coverage of predicates in the sources.\relax }}{43}{figure.caption.168}}
\newlabel{fig:sourcecoverage}{{3.7}{43}{Coverage of predicates in the sources.\relax }{figure.caption.168}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.6.2}SERIMI Configurations}{44}{subsection.169}}
\@writefile{lof}{\contentsline {figure}{\numberline {3.8}{\ignorespaces Time performance; tasks are ordered according to the number of triples in the candidate sets.\relax }}{46}{figure.caption.170}}
\newlabel{fig:taskvstime}{{3.8}{46}{Time performance; tasks are ordered according to the number of triples in the candidate sets.\relax }{figure.caption.170}{}}
\@writefile{lot}{\contentsline {table}{\numberline {3.4}{\ignorespaces Time performance for different SERIMI configurations, in seconds.\relax }}{47}{table.caption.171}}
\newlabel{table:timetable}{{3.4}{47}{Time performance for different SERIMI configurations, in seconds.\relax }{table.caption.171}{}}
\@writefile{lot}{\contentsline {table}{\numberline {3.5}{\ignorespaces F1 performance for different SERIMI configurations.\relax }}{48}{table.caption.172}}
\newlabel{table:tablef1s}{{3.5}{48}{F1 performance for different SERIMI configurations.\relax }{table.caption.172}{}}
\citation{Euzenat10}
\citation{DBLP:conf/www/HuCQ11}
\citation{DBLP:conf/semweb/EuzenatFHHMNRSSSST11}
\citation{DBLP:journals/pvldb/SuchanekAS11}
\citation{DBLP:journals/pvldb/WangLYF11}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.6.3}SERIMI vs. Alternative Approaches}{49}{subsection.173}}
\@writefile{lot}{\contentsline {table}{\numberline {3.6}{\ignorespaces F1 performance for SERIMI, OC2010, RIMON, OC2012 over OAEI 2010 data; some results were not available for OC2010, RIMON OC2012.\relax }}{49}{table.caption.174}}
\newlabel{table:oaei2010oc}{{3.6}{49}{F1 performance for SERIMI, OC2010, RIMON, OC2012 over OAEI 2010 data; some results were not available for OC2010, RIMON OC2012.\relax }{table.caption.174}{}}
\@writefile{lot}{\contentsline {table}{\numberline {3.7}{\ignorespaces F1 performance for OAEI 2011.\relax }}{50}{table.caption.175}}
\newlabel{table:oaei2012table}{{3.7}{50}{F1 performance for OAEI 2011.\relax }{table.caption.175}{}}
\citation{melnik_similarity_2002,spaccapietra_survey_2005,bernstein_discovering_2009}
\citation{hu_bootstrapping_2011}
\citation{DBLP:journals/pvldb/SuchanekAS11}
\citation{DBLP:conf/ijcai/CohenRF03}
\citation{budanitsky_evaluating_2006,han_structural_2010}
\citation{DBLP:conf/semweb/NiuRZW11}
\citation{DBLP:conf/esws/NikolovdM12}
\citation{DBLP:journals/pvldb/WangLYF11}
\citation{DBLP:conf/semweb/RongNXWYY12}
\citation{DBLP:conf/vldb/ChaudhuriCGK07}
\citation{DBLP:conf/semweb/NiuRZW11}
\citation{DBLP:conf/semweb/WangZHZLQT10}
\citation{Song:2011:AGD:2063016.2063058}
\@writefile{toc}{\contentsline {section}{\numberline {3.7}Related Work}{51}{section.176}}
\newlabel{chapter:serimi7}{{3.7}{51}{Related Work}{section.176}{}}
\citation{DBLP:conf/cikm/BohmMNW12}
\@writefile{toc}{\contentsline {section}{\numberline {3.8}Conclusion}{52}{section.177}}
\newlabel{chapter:serimi8}{{3.8}{52}{Conclusion}{section.177}{}}
\@writefile{toc}{\contentsline {chapter}{\numberline {4}Efficient and Effective On-the-fly Candidate Selection over Sparql Endpoints}{53}{chapter.178}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{chapter:sonda}{{4}{53}{Efficient and Effective On-the-fly Candidate Selection over Sparql Endpoints}{chapter.178}{}}
\citation{DBLP:conf/www/JaffriGM08,DBLP:conf/www/VolzBGK09,DBLP:journals/ijswis/FerraraNS11,DBLP:conf/www/HuCQ11,DBLP:books/daglib/0030287}
\citation{hernandez_merge/purge_1995,MichelsonK06,elmagarmid_duplicate_2007}
\citation{DBLP:conf/semweb/SongH11,MaurouxHJAM09}
\citation{DBLP:series/synthesis/2011Gal}
\@writefile{toc}{\contentsline {section}{\numberline {4.1}Introduction}{54}{section.179}}
\citation{DBLP:conf/rweb/Parsia06,DBLP:conf/icde/LabordaC06,DBLP:conf/esws/DietzoldA07,DBLP:conf/aswc/CornoCCV08}
\citation{DBLP:conf/semweb/GorlitzS11,DBLP:conf/semweb/MontoyaVCRA12}
\citation{DBLP:conf/webdb/AraujoTDHS12}
\@writefile{toc}{\contentsline {section}{\numberline {4.2}Overview}{57}{section.204}}
\newlabel{chapter:sonda2}{{4.2}{57}{Overview}{section.204}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.2.1}Problem - Find Candidate Matches}{57}{subsection.207}}
\citation{DBLP:conf/vldb/ChaudhuriCGK07}
\citation{DBLP:conf/semweb/SongH11}
\citation{DBLP:conf/wsdm/PapadakisINF11}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.2.2}Existing Solutions}{59}{subsection.210}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.2.3}Sonda}{59}{subsection.211}}
\citation{DBLP:books/daglib/0023820}
\citation{DBLP:journals/tods/PerezAG09}
\@writefile{lof}{\contentsline {figure}{\numberline {4.1}{\ignorespaces The process of learning queries and executing them. \relax }}{60}{figure.caption.212}}
\newlabel{fig:template}{{4.1}{60}{The process of learning queries and executing them. \relax }{figure.caption.212}{}}
\@writefile{toc}{\contentsline {section}{\numberline {4.3}Learning Queries}{61}{section.213}}
\newlabel{chapter:sonda3}{{4.3}{61}{Learning Queries}{section.213}{}}
\citation{DBLP:conf/semweb/SongH11}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.1}Finding Comparable Key Pairs}{62}{subsection.233}}
\citation{DBLP:series/synthesis/2011Gal}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.2}Constructing Attribute Components}{63}{subsection.235}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {4}{\ignorespaces AttributeComponentQueries($S$, $G_S$, $G_T$).\relax }}{64}{algorithm.236}}
\newlabel{alg:buildattributequeries}{{4}{64}{AttributeComponentQueries($S$, $G_S$, $G_T$).\relax }{ALC@unique.250}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.3.3}Learning Class Components}{64}{subsection.251}}
\citation{DBLP:conf/soda/CarrDKM00}
\@writefile{toc}{\contentsline {section}{\numberline {4.4}Executing Optimal Queries}{65}{section.252}}
\newlabel{chapter:sonda4}{{4.4}{65}{Executing Optimal Queries}{section.252}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.4.1}Estimating Metrics for Query Optimality}{66}{subsection.254}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.4.2}Optimal Queries for One Instance}{67}{subsection.259}}
\citation{DBLP:books/mk/WittenF99,DBLP:conf/nips/NgJ01}
\citation{INSR:INSR385}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.4.3}Optimization Process for All Instances}{69}{subsection.263}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {5}{\ignorespaces CandidateSelection($S$, $G_S$, $G_T$, $\beta $, $n$).\relax }}{70}{algorithm.264}}
\newlabel{alg:candidateselection}{{5}{70}{CandidateSelection($S$, $G_S$, $G_T$, $\beta $, $n$).\relax }{ALC@unique.274}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {4.2}{\ignorespaces All queries are evaluated in the Sorting phase (black and dashed circles stand for optimal and ``unnecessary'' queries, respectively), while fewer queries are evaluated in the Learning and Predicting phases (white circles denote unevaluated queries).\relax }}{70}{figure.caption.275}}
\newlabel{fig:branch}{{4.2}{70}{All queries are evaluated in the Sorting phase (black and dashed circles stand for optimal and ``unnecessary'' queries, respectively), while fewer queries are evaluated in the Learning and Predicting phases (white circles denote unevaluated queries).\relax }{figure.caption.275}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {6}{\ignorespaces SortingPhase($S$, $Q_S$, $\beta $).\relax }}{71}{algorithm.276}}
\newlabel{alg:sortingphase}{{6}{71}{SortingPhase($S$, $Q_S$, $\beta $).\relax }{ALC@unique.288}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {7}{\ignorespaces LearningPhase($S$, $Q_S$, $\Gamma $,$n$).\relax }}{71}{algorithm.289}}
\newlabel{alg:learningphase}{{7}{71}{LearningPhase($S$, $Q_S$, $\Gamma $,$n$).\relax }{ALC@unique.305}{}}
\citation{DBLP:journals/jods/EuzenatMSSS11}
\citation{DBLP:conf/semweb/SongH11}
\@writefile{loa}{\contentsline {algorithm}{\numberline {8}{\ignorespaces PredictingPhase($S$, $Q_S$, $\Gamma $).\relax }}{72}{algorithm.306}}
\newlabel{alg:predictingphase}{{8}{72}{PredictingPhase($S$, $Q_S$, $\Gamma $).\relax }{ALC@unique.318}{}}
\@writefile{toc}{\contentsline {section}{\numberline {4.5}Evaluation}{72}{section.319}}
\newlabel{chapter:sonda5}{{4.5}{72}{Evaluation}{section.319}{}}
\citation{papadakis_efficient_2011}
\citation{DBLP:conf/semweb/SongH11}
\@writefile{lot}{\contentsline {table}{\numberline {4.1}{\ignorespaces Results of the three systems over all pairs of datasets, where Queries denotes the total number of queries issued by the system, Queries/Instance (Q/I) denotes the amount of queries evaluated per instance, and Learning(s) and Search(s) stands for the time needed for learning queries and executing them, respectively.\relax }}{75}{table.caption.322}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.5.1}Candidate Selection Results}{77}{subsection.324}}
\@writefile{lof}{\contentsline {figure}{\numberline {4.3}{\ignorespaces F1 for Sonda-A, S-agnostic and S-based for query limits 10, 30, 50 and 100.\relax }}{80}{figure.caption.325}}
\newlabel{fig:limitsagnostic}{{4.3}{80}{F1 for Sonda-A, S-agnostic and S-based for query limits 10, 30, 50 and 100.\relax }{figure.caption.325}{}}
\@writefile{lof}{\contentsline {figure}{\numberline {4.4}{\ignorespaces Execution time for Sonda-A, S-agnostic and S-based for query limits 10, 30, 50 and 100.\relax }}{80}{figure.caption.326}}
\newlabel{fig:limitsbased}{{4.4}{80}{Execution time for Sonda-A, S-agnostic and S-based for query limits 10, 30, 50 and 100.\relax }{figure.caption.326}{}}
\citation{serimi}
\citation{DBLP:conf/semweb/WangZHZLQT10}
\citation{DBLP:conf/semweb/HuCCQ10}
\@writefile{lof}{\contentsline {figure}{\numberline {4.5}{\ignorespaces Percentages of query types executed by Sonda-A per task.\relax }}{81}{figure.caption.327}}
\newlabel{fig:frequency}{{4.5}{81}{Percentages of query types executed by Sonda-A per task.\relax }{figure.caption.327}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.5.2}Instance Matching Results}{81}{subsection.328}}
\@writefile{lot}{\contentsline {table}{\numberline {4.2}{\ignorespaces Sonda+SERIMI compared to other OAEI 2010 published results.\relax }}{82}{table.caption.330}}
\@writefile{toc}{\contentsline {subsection}{\numberline {4.5.3}Utility of the Approach}{82}{subsection.331}}
\newlabel{eq:tradeoff_condition}{{4.1}{82}{Utility of the Approach}{equation.332}{}}
\newlabel{eq:tradeoff_condition2}{{4.2}{82}{Utility of the Approach}{equation.333}{}}
\citation{hernandez_merge/purge_1995}
\citation{DBLP:conf/wsdm/PapadakisINF11}
\citation{DBLP:conf/wsdm/PapadakisINPN12}
\citation{DBLP:conf/semweb/SongH11}
\citation{DBLP:conf/semweb/SongH11,hu_bootstrapping_2011,DBLP:journals/tkde/LiTLL09,DBLP:conf/vldb/ChaudhuriCGK07}
\citation{DBLP:journals/jair/BhattacharyaG07}
\citation{DBLP:journals/jair/BhattacharyaG07}
\citation{DBLP:journals/jair/BhattacharyaG07}
\@writefile{toc}{\contentsline {section}{\numberline {4.6}Related Work}{83}{section.334}}
\newlabel{chapter:sonda6}{{4.6}{83}{Related Work}{section.334}{}}
\citation{DBLP:journals/pvldb/MetwallyF12}
\citation{DBLP:conf/webdb/AraujoTDHS12}
\citation{DBLP:conf/www/HerzigT12}
\@writefile{toc}{\contentsline {section}{\numberline {4.7}Conclusions}{84}{section.335}}
\newlabel{chapter:sonda7}{{4.7}{84}{Conclusions}{section.335}{}}
\@writefile{toc}{\contentsline {chapter}{\numberline {5}Learning Edit-Distance Based String Transformation Rules From Examples}{85}{chapter.336}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{chapter:string}{{5}{85}{Learning Edit-Distance Based String Transformation Rules From Examples}{chapter.336}{}}
\citation{DBLP:journals/expert/Fayyad96,DBLP:journals/debu/RahmD00}
\citation{DBLP:conf/popl/Gulwani11}
\citation{DBLP:journals/cacm/GulwaniHS12}
\citation{DBLP:journals/cacm/GulwaniHS12}
\citation{DBLP:journals/aim/Lau09}
\@writefile{lot}{\contentsline {table}{\numberline {5.1}{\ignorespaces Examples of String Transformations\relax }}{86}{table.caption.340}}
\newlabel{table:ruleexamples}{{5.1}{86}{Examples of String Transformations\relax }{table.caption.340}{}}
\@writefile{toc}{\contentsline {section}{\numberline {5.1}Introduction}{86}{section.337}}
\citation{DBLP:journals/pvldb/ArasuCK09}
\citation{DBLP:conf/icai/MichelsonK09}
\citation{DBLP:conf/emnlp/OkazakiTAT08}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.1.1}Overview and Contributions}{88}{subsection.341}}
\@writefile{toc}{\contentsline {section}{\numberline {5.2}Learning Transformations}{89}{section.342}}
\newlabel{sec:problem}{{5.2}{89}{Learning Transformations}{section.342}{}}
\citation{levelshtein-66-binary}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.2.1}Preliminary Definitions}{90}{subsection.343}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.2.2}Transformation Rules}{91}{subsection.351}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.2.3}Generalization of Transformation Rules}{92}{subsection.353}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.2.4}Learning Problem}{95}{subsection.359}}
\@writefile{toc}{\contentsline {section}{\numberline {5.3}Rule Learner Algorithm}{96}{section.365}}
\newlabel{sec:algorithm}{{5.3}{96}{Rule Learner Algorithm}{section.365}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3.1}Rule Learning}{96}{subsection.366}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3.2}Relative Position Algorithm}{96}{subsection.367}}
\@writefile{lof}{\contentsline {figure}{\numberline {5.1}{\ignorespaces String $u=``Noia, La"$, $u^c=\textbf  {zulllpsulz}$, $E_2(u^c)=\{\textbf  {zu, ul, ll, ll, lp, ps, su, ul, lz}\}$, $w_{e_1}=\textbf  {zulllpsu}$ and $w_{e_9}=\textbf  {ulz}$.\relax }}{97}{figure.caption.368}}
\newlabel{fig:diagram}{{5.1}{97}{String $u=``Noia, La"$, $u^c=\textbf {zulllpsulz}$, $E_2(u^c)=\{\textbf {zu, ul, ll, ll, lp, ps, su, ul, lz}\}$, $w_{e_1}=\textbf {zulllpsu}$ and $w_{e_9}=\textbf {ulz}$.\relax }{figure.caption.368}{}}
\newlabel{eq:relative}{{5.3}{97}{Relative Position Algorithm}{equation.369}{}}
\newlabel{eq:fremean}{{5.4}{97}{Relative Position Algorithm}{equation.370}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {9}{\ignorespaces RelativePosition($u$, $i$, $n$).\relax }}{98}{algorithm.372}}
\newlabel{alg:relativeposition}{{9}{98}{RelativePosition($u$, $i$, $n$).\relax }{ALC@unique.392}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3.3}Permutation Rule Learner}{98}{subsection.393}}
\newlabel{eq:permutation}{{5.6}{99}{Permutation Rule Learner}{equation.394}{}}
\citation{2009design}
\@writefile{loa}{\contentsline {algorithm}{\numberline {10}{\ignorespaces Sorting($t_c$, $v$).\relax }}{100}{algorithm.397}}
\newlabel{alg:ss}{{10}{100}{Sorting($t_c$, $v$).\relax }{ALC@unique.416}{}}
\newlabel{lemma:ss}{{5.15}{100}{}{theorem.417}{}}
\citation{DBLP:books/daglib/0023376}
\citation{DBLP:books/cu/Gusfield1997}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3.4}Insertions and Deletions Rule Learner}{101}{subsection.421}}
\@writefile{lof}{\contentsline {figure}{\numberline {5.2}{\ignorespaces All common substrings between $u_p = ``Aug\ 06,\ 2013"$ and $v = ``06/08/13"$.\relax }}{101}{figure.caption.423}}
\newlabel{fig:permutation}{{5.2}{101}{All common substrings between $u_p = ``Aug\ 06,\ 2013"$ and $v = ``06/08/13"$.\relax }{figure.caption.423}{}}
\citation{DBLP:books/daglib/0019552}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3.5}Update Rule Learner }{102}{subsection.424}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3.6}Discussion}{103}{subsection.425}}
\@writefile{toc}{\contentsline {section}{\numberline {5.4}Rule Selector Method}{103}{section.426}}
\newlabel{sec:ruleselector}{{5.4}{103}{Rule Selector Method}{section.426}{}}
\@writefile{toc}{\contentsline {section}{\numberline {5.5}Evaluation}{104}{section.427}}
\newlabel{sec:evaluations}{{5.5}{104}{Evaluation}{section.427}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.5.1}Data}{104}{subsection.428}}
\citation{Ziegler:2005:IRL:1060745.1060754}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.5.2}Evaluation Metric }{106}{subsection.431}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.5.3}Rule Coverage}{107}{subsection.433}}
\@writefile{lot}{\contentsline {table}{\numberline {5.2}{\ignorespaces  Maximal Coverage Per Task \relax }}{107}{table.caption.434}}
\newlabel{table:rulecoverage}{{5.2}{107}{Maximal Coverage Per Task \relax }{table.caption.434}{}}
\@writefile{lot}{\contentsline {table}{\numberline {5.3}{\ignorespaces  The first 7 rules with the highest coverage for the Abbreviations dataset using $E_2$. \relax }}{107}{table.caption.435}}
\newlabel{table:coverageabbreviations}{{5.3}{107}{The first 7 rules with the highest coverage for the Abbreviations dataset using $E_2$. \relax }{table.caption.435}{}}
\@writefile{lot}{\contentsline {table}{\numberline {5.4}{\ignorespaces  The first 11 rules with the highest coverage for the Books dataset using $E_2$. \relax }}{108}{table.caption.436}}
\newlabel{table:coveragebooks}{{5.4}{108}{The first 11 rules with the highest coverage for the Books dataset using $E_2$. \relax }{table.caption.436}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.5.4}Rule Selector Accuracy}{108}{subsection.437}}
\citation{DBLP:conf/uai/ChengG99}
\@writefile{lot}{\contentsline {table}{\numberline {5.5}{\ignorespaces Abbreviations Examples\relax }}{109}{table.caption.438}}
\newlabel{table:abbreviationsexamples}{{5.5}{109}{Abbreviations Examples\relax }{table.caption.438}{}}
\@writefile{lot}{\contentsline {table}{\numberline {5.6}{\ignorespaces Book Titles Examples\relax }}{109}{table.caption.439}}
\newlabel{table:bookexamples}{{5.6}{109}{Book Titles Examples\relax }{table.caption.439}{}}
\@writefile{lot}{\contentsline {table}{\numberline {5.7}{\ignorespaces Song Examples\relax }}{109}{table.caption.440}}
\newlabel{table:songexamples}{{5.7}{109}{Song Examples\relax }{table.caption.440}{}}
\citation{1183917,DBLP:journals/aai/RatanamahatanaG03}
\@writefile{lot}{\contentsline {table}{\numberline {5.8}{\ignorespaces Dates Examples\relax }}{110}{table.caption.441}}
\newlabel{table:datesexamples}{{5.8}{110}{Dates Examples\relax }{table.caption.441}{}}
\@writefile{lot}{\contentsline {table}{\numberline {5.9}{\ignorespaces Accuracy of the Rule Algorithm With $E_2$\relax }}{110}{table.caption.442}}
\newlabel{table:results}{{5.9}{110}{Accuracy of the Rule Algorithm With $E_2$\relax }{table.caption.442}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.5.5}Runtime Cost}{110}{subsection.443}}
\citation{DBLP:conf/popl/Gulwani11,DBLP:journals/cacm/GulwaniHS12}
\@writefile{lof}{\contentsline {figure}{\numberline {5.3}{\ignorespaces Learning time varying the sample size for the Books dataset. We considered 4 runs for each sample size.\relax }}{111}{figure.caption.444}}
\newlabel{fig:time}{{5.3}{111}{Learning time varying the sample size for the Books dataset. We considered 4 runs for each sample size.\relax }{figure.caption.444}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.5.6}Performance Comparison}{111}{subsection.445}}
\@writefile{lot}{\contentsline {table}{\numberline {5.10}{\ignorespaces Average accuracy per systems.\relax }}{112}{table.caption.446}}
\newlabel{table:comparisonflashfill}{{5.10}{112}{Average accuracy per systems.\relax }{table.caption.446}{}}
\citation{DBLP:journals/pvldb/ArasuCK09}
\citation{DBLP:conf/icai/MichelsonK09}
\citation{DBLP:conf/dexa/PatroW11}
\citation{DBLP:conf/kdd/TejadaKM02}
\citation{DBLP:conf/emnlp/OkazakiTAT08}
\citation{Bouchard04thetrade-off}
\citation{DBLP:conf/popl/Gulwani11}
\citation{DBLP:journals/pvldb/SinghG12}
\citation{DBLP:conf/aaai/WuSK12}
\@writefile{toc}{\contentsline {section}{\numberline {5.6}Related Work}{113}{section.448}}
\newlabel{sec:relatedwork}{{5.6}{113}{Related Work}{section.448}{}}
\citation{conf/acl/SattaH97}
\citation{DBLP:conf/vldb/RamanH01}
\@writefile{toc}{\contentsline {section}{\numberline {5.7}Conclusions}{114}{section.449}}
\newlabel{sec:conclusion}{{5.7}{114}{Conclusions}{section.449}{}}
\@writefile{toc}{\contentsline {chapter}{\numberline {6}Exercises on Knowledge Based Acceleration}{117}{chapter.450}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{chapter:trec}{{6}{117}{Exercises on Knowledge Based Acceleration}{chapter.450}{}}
\citation{trec-kba-overview-2012}
\@writefile{toc}{\contentsline {section}{\numberline {6.1}Introduction}{118}{section.451}}
\@writefile{toc}{\contentsline {section}{\numberline {6.2}TREC-KBA Task Overview}{119}{section.452}}
\newlabel{chapter:trec2}{{6.2}{119}{TREC-KBA Task Overview}{section.452}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.2.1}Data Overview}{119}{subsection.453}}
\@writefile{lot}{\contentsline {table}{\numberline {6.1}{\ignorespaces Entities Names\relax }}{119}{table.caption.454}}
\newlabel{table:entitiestrec}{{6.1}{119}{Entities Names\relax }{table.caption.454}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.2.2}TREC-KBA Baseline}{120}{subsection.456}}
\newlabel{eq:baselinetrec}{{6.1}{120}{TREC-KBA Baseline}{equation.457}{}}
\@writefile{toc}{\contentsline {section}{\numberline {6.3}Approaches}{120}{section.458}}
\newlabel{chapter:trec3}{{6.3}{120}{Approaches}{section.458}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.3.1}Entity Representation}{120}{subsection.459}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.3.2}Prefix-Suffix Learning Approach}{121}{subsection.474}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {11}{\ignorespaces LearningPrefixSuffixStrings($e$, $\Delta ^{+}$,$\Delta ^{-}$, $K$).\relax }}{122}{algorithm.475}}
\newlabel{alg:prefixsuffix}{{11}{122}{LearningPrefixSuffixStrings($e$, $\Delta ^{+}$,$\Delta ^{-}$, $K$).\relax }{ALC@unique.492}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.3.3}Disambiguator Approach}{122}{subsection.493}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {12}{\ignorespaces DisambiguatorCentralAnnotator($E$, $D$, $L$).\relax }}{124}{algorithm.542}}
\newlabel{alg:disambiguator}{{12}{124}{DisambiguatorCentralAnnotator($E$, $D$, $L$).\relax }{ALC@unique.562}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {6.3.4}Language Model Approach}{125}{subsection.563}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {13}{\ignorespaces LanguageModelTraining($E$, $\Delta ^+$).\relax }}{125}{algorithm.566}}
\newlabel{alg:languagemodel}{{13}{125}{LanguageModelTraining($E$, $\Delta ^+$).\relax }{ALC@unique.580}{}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {14}{\ignorespaces LanguageModelCentralAnnotator($E$, $D$, $LM$).\relax }}{126}{algorithm.581}}
\newlabel{alg:languagemodelannotator}{{14}{126}{LanguageModelCentralAnnotator($E$, $D$, $LM$).\relax }{ALC@unique.596}{}}
\@writefile{toc}{\contentsline {section}{\numberline {6.4}Evaluations and Discussions}{126}{section.597}}
\newlabel{chapter:trec4}{{6.4}{126}{Evaluations and Discussions}{section.597}{}}
\citation{trec-kba-overview-2012}
\@writefile{lot}{\contentsline {table}{\numberline {6.2}{\ignorespaces Precision (P), Recall (R) and F1 for each evaluated approach, w.r.t central documents.\relax }}{127}{table.caption.598}}
\newlabel{table:resultstrec}{{6.2}{127}{Precision (P), Recall (R) and F1 for each evaluated approach, w.r.t central documents.\relax }{table.caption.598}{}}
\@writefile{toc}{\contentsline {section}{\numberline {6.5}Conclusion}{128}{section.599}}
\newlabel{chapter:trec5}{{6.5}{128}{Conclusion}{section.599}{}}
\@writefile{toc}{\contentsline {chapter}{\numberline {7}Conclusions}{129}{chapter.600}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{chapter:conclusions}{{7}{129}{Conclusions}{chapter.600}{}}
\@writefile{toc}{\contentsline {section}{\numberline {7.1}Research Questions}{129}{section.601}}
\@writefile{toc}{\contentsline {subsection}{\numberline {7.1.1}Towards Self-Linking Linked Data}{129}{subsection.602}}
\@writefile{toc}{\contentsline {subsection}{\numberline {7.1.2}SERIMI: Class-based Matching for Instance Matching Across Heterogeneous Datasets}{129}{subsection.603}}
\@writefile{toc}{\contentsline {subsection}{\numberline {7.1.3}Efficient and Effective On-the-fly Candidate Selection over Sparql Endpoints}{130}{subsection.604}}
\citation{DBLP:conf/semweb/AuerBKLCI07,DBLP:journals/ws/BizerLKABCH09,DBLP:conf/esws/KobilarovSROSSBL09}
\@writefile{toc}{\contentsline {subsection}{\numberline {7.1.4}Learning Edit-Distance Based String Transformation Rules From Examples}{131}{subsection.607}}
\@writefile{toc}{\contentsline {subsection}{\numberline {7.1.5}Exercises on Knowledge Based Acceleration}{132}{subsection.608}}
\@writefile{toc}{\contentsline {section}{\numberline {7.2}Future Research}{133}{section.609}}
\@writefile{toc}{\vspace  {2em}}
\citation{tversky1977features}
\@writefile{toc}{\contentsline {chapter}{\numberline {A}Jaccard Vs. FSSim}{135}{appendix.610}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
\newlabel{AppendixA}{{A}{135}{Jaccard Vs. FSSim}{appendix.610}{}}
\newlabel{eq:ratiomodel}{{A.1}{135}{Jaccard Vs. FSSim}{equation.611}{}}
\newlabel{eq:proof1}{{A}{135}{Jaccard Vs. FSSim}{equation.611}{}}
\newlabel{lemma:lemma2}{{A.1}{135}{}{theorem.612}{}}
\@writefile{toc}{\vspace  {2em}}
\bibstyle{unsrtnat}
\bibdata{Bibliography}
\bibcite{dorneles_approximate_2011}{{1}{2011}{{Dorneles et~al.}}{{Dorneles, Gon\c {c}alves, and dos Santos~Mello}}}
\bibcite{elmagarmid_duplicate_2007}{{2}{2007}{{Elmagarmid et~al.}}{{Elmagarmid, Ipeirotis, and Verykios}}}
\bibcite{spaccapietra_survey_2005}{{3}{2005}{{Shvaiko and Euzenat}}{{}}}
\bibcite{citeulike:1176986}{{4}{2001}{{Berners-Lee et~al.}}{{Berners-Lee, Hendler, and Lassila}}}
\bibcite{bizer_linked_2009}{{5}{2009{}}{{Bizer et~al.}}{{Bizer, Heath, and Berners-Lee}}}
\bibcite{DBLP:books/daglib/0030287}{{6}{2012}{{Christen}}{{}}}
\bibcite{DBLP:journals/dke/KopckeR10}{{7}{2010}{{K{\"o}pcke and Rahm}}{{}}}
\bibcite{DBLP:journals/vldb/RahmB01}{{8}{2001}{{Rahm and Bernstein}}{{}}}
\bibcite{DBLP:journals/sigmod/Noy04}{{9}{2004}{{Noy}}{{}}}
\bibcite{DBLP:journals/aim/DoanH05}{{10}{2005}{{Doan and Halevy}}{{}}}
\bibcite{DBLP:journals/jwe/KonstantinouSM08}{{11}{2008}{{Konstantinou et~al.}}{{Konstantinou, Spanos, and Mitrou}}}
\@writefile{toc}{\contentsline {chapter}{Bibliography}{137}{dummy.613}}
\newlabel{Bibliography}{{6}{137}{Jaccard Vs. FSSim}{dummy.613}{}}
\bibcite{DBLP:journals/tkde/ShvaikoE13}{{12}{2013}{{Shvaiko and Euzenat}}{{}}}
\bibcite{DBLP:journals/internet/FreitasCOO12}{{13}{2012}{{Freitas et~al.}}{{Freitas, Curry, Oliveira, and O'Riain}}}
\bibcite{DBLP:conf/www/Berners-LeeHLPPS08}{{14}{2008}{{Berners-Lee et~al.}}{{Berners-Lee, Hollenbach, Lu, Presbrey, Prud'hommeaux, and Schraefel}}}
\bibcite{DBLP:conf/swap/dAquinSMAGLZ08}{{15}{2008}{{d'Aquin et~al.}}{{d'Aquin, Sabou, Motta, Angeletou, Gridinoc, Lopez, and Zablith}}}
\bibcite{DBLP:conf/www/AraujoS09}{{16}{2009}{{Ara{\'u}jo and Schwabe}}{{}}}
\bibcite{DBLP:journals/ws/HoganHUKPD11}{{17}{2011}{{Hogan et~al.}}{{Hogan, Harth, Umbrich, Kinsella, Polleres, and Decker}}}
\bibcite{DBLP:conf/semweb/HalpinHMMT10}{{18}{2010}{{Halpin et~al.}}{{Halpin, Hayes, McCusker, McGuinness, and Thompson}}}
\bibcite{DBLP:conf/semweb/HuS10}{{19}{2010}{{Hu and Svensson}}{{}}}
\bibcite{DBLP:conf/semweb/MillardGSS10}{{20}{2010}{{Millard et~al.}}{{Millard, Glaser, Salvadores, and Shadbolt}}}
\bibcite{DBLP:conf/rr/Hogan11}{{21}{2011}{{Hogan}}{{}}}
\bibcite{DBLP:conf/aaaiss/JainHYVS10}{{22}{2010}{{Jain et~al.}}{{Jain, Hitzler, Yeh, Verma, and Sheth}}}
\bibcite{DBLP:journals/ws/HoganUHCPD12}{{23}{2012}{{Hogan et~al.}}{{Hogan, Umbrich, Harth, Cyganiak, Polleres, and Decker}}}
\bibcite{DBLP:conf/aaaiss/TummarelloD10}{{24}{2010}{{Tummarello and Delbru}}{{}}}
\bibcite{DBLP:conf/webdb/AraujoTDHS12}{{25}{2012}{{Ara{\'u}jo et~al.}}{{Ara{\'u}jo, Tran, DeVries, Hidders, and Schwabe}}}
\bibcite{DBLP:conf/semweb/EuzenatFHHMNRSSSST11}{{26}{2011{}}{{Euzenat et~al.}}{{Euzenat, Ferrara, van Hage, Hollink, Meilicke, Nikolov, Ritze, Scharffe, Shvaiko, Stuckenschmidt, Sv{\'a}b-Zamazal, and dos Santos}}}
\bibcite{MichelsonK06}{{27}{2006}{{Michelson and Knoblock}}{{}}}
\bibcite{DBLP:conf/webdb/IseleJB11}{{28}{2011}{{Isele et~al.}}{{Isele, Jentzsch, and Bizer}}}
\bibcite{DBLP:conf/wsdm/PapadakisINPN12}{{29}{2012}{{Papadakis et~al.}}{{Papadakis, Ioannou, Nieder{\'e}e, Palpanas, and Nejdl}}}
\bibcite{fellegi_theory_1969}{{30}{1969}{{Fellegi and Sunter}}{{}}}
\bibcite{DBLP:conf/www/VolzBGK09}{{31}{2009{}}{{Volz et~al.}}{{Volz, Bizer, Gaedke, and Kobilarov}}}
\bibcite{DBLP:conf/semweb/HartigBF09}{{32}{2009}{{Hartig et~al.}}{{Hartig, Bizer, and Freytag}}}
\bibcite{DBLP:series/sci/GorlitzS11}{{33}{2011{}}{{G{\"o}rlitz and Staab}}{{}}}
\bibcite{DBLP:conf/semweb/SchwarteHHSS11}{{34}{2011}{{Schwarte et~al.}}{{Schwarte, Haase, Hose, Schenkel, and Schmidt}}}
\bibcite{hu_bootstrapping_2011}{{35}{2011{}}{{Hu et~al.}}{{Hu, Qu, and Sun}}}
\bibcite{nikolov08}{{36}{2008}{{Nikolov et~al.}}{{Nikolov, Uren, Motta, and Roeck}}}
\bibcite{DBLP:journals/pvldb/SuchanekAS11}{{37}{2011}{{Suchanek et~al.}}{{Suchanek, Abiteboul, and Senellart}}}
\bibcite{DBLP:conf/semweb/SongH11}{{38}{2011{}}{{Song and Heflin}}{{}}}
\bibcite{DBLP:conf/semweb/RongNXWYY12}{{39}{2012}{{Rong et~al.}}{{Rong, Niu, Xiang, Wang, Yang, and Yu}}}
\bibcite{DBLP:conf/semweb/SchultzMIBB11}{{40}{2011}{{Schultz et~al.}}{{Schultz, Matteini, Isele, Bizer, and Becker}}}
\bibcite{DBLP:journals/pvldb/IseleB12}{{41}{2012}{{Isele and Bizer}}{{}}}
\bibcite{DBLP:conf/www/AlexanderCHZ09}{{42}{2009}{{Alexander et~al.}}{{Alexander, Cyganiak, Hausenblas, and Zhao}}}
\bibcite{DBLP:conf/ecai/EuzenatV04}{{43}{2004}{{Euzenat and Valtchev}}{{}}}
\bibcite{DBLP:conf/iceis/LemeCBF09}{{44}{2009}{{Leme et~al.}}{{Leme, Casanova, Breitman, and Furtado}}}
\bibcite{DBLP:conf/semweb/NiuRZW11}{{45}{2011}{{Niu et~al.}}{{Niu, Rong, Zhang, and Wang}}}
\bibcite{Euzenat10}{{46}{2010}{{{Euzenat} et~al.}}{{{Euzenat}, {Ferrara}, {Meilicke}, {Nikolov}, {Pane}, {Scharffe}, {Shvaiko}, {Stuckenschmidt}, {Sváb-Zamazal}, {Svátek}, and {Trojahn dos Santos}}}}
\bibcite{DBLP:journals/pvldb/WangLYF11}{{47}{2011}{{Wang et~al.}}{{Wang, Li, Yu, and Feng}}}
\bibcite{hernandez_merge/purge_1995}{{48}{1995}{{Hern{\'a}ndez and Stolfo}}{{}}}
\bibcite{mccallum_efficient_2000}{{49}{2000}{{McCallum et~al.}}{{McCallum, Nigam, and Ungar}}}
\bibcite{papadakis_efficient_2011}{{50}{2011}{{Papadakis and Nejdl}}{{}}}
\bibcite{DBLP:journals/pvldb/ArasuCK09}{{51}{2009}{{Arasu et~al.}}{{Arasu, Chaudhuri, and Kaushik}}}
\bibcite{Song:2011:AGD:2063016.2063058}{{52}{2011{}}{{Song and Heflin}}{{}}}
\bibcite{typifier}{{53}{2013}{{Ma and Tran}}{{}}}
\bibcite{DBLP:journals/eor/AlidaeeGKW07}{{54}{2007}{{Alidaee et~al.}}{{Alidaee, Glover, Kochenberger, and Wang}}}
\bibcite{tversky1977features}{{55}{1977}{{Tversky}}{{}}}
\bibcite{DBLP:conf/vldb/ChaudhuriCGK07}{{56}{2007}{{Chaudhuri et~al.}}{{Chaudhuri, Chen, Ganti, and Kaushik}}}
\bibcite{chauvenet}{{57}{1960}{{Chauvenet}}{{}}}
\bibcite{DBLP:conf/www/HuCQ11}{{58}{2011{}}{{Hu et~al.}}{{Hu, Chen, and Qu}}}
\bibcite{melnik_similarity_2002}{{59}{2002}{{Melnik et~al.}}{{Melnik, Garcia-Molina, and Rahm}}}
\bibcite{bernstein_discovering_2009}{{60}{2009{}}{{Volz et~al.}}{{Volz, Bizer, Gaedke, and Kobilarov}}}
\bibcite{DBLP:conf/ijcai/CohenRF03}{{61}{2003}{{Cohen et~al.}}{{Cohen, Ravikumar, and Fienberg}}}
\bibcite{budanitsky_evaluating_2006}{{62}{2006}{{Budanitsky and Hirst}}{{}}}
\bibcite{han_structural_2010}{{63}{2010}{{Han and Zhao}}{{}}}
\bibcite{DBLP:conf/esws/NikolovdM12}{{64}{2012}{{Nikolov et~al.}}{{Nikolov, d'Aquin, and Motta}}}
\bibcite{DBLP:conf/semweb/WangZHZLQT10}{{65}{2010}{{Wang et~al.}}{{Wang, Zhang, Hou, Zhao, Li, Qi, and Tang}}}
\bibcite{DBLP:conf/cikm/BohmMNW12}{{66}{2012}{{B{\"o}hm et~al.}}{{B{\"o}hm, de~Melo, Naumann, and Weikum}}}
\bibcite{DBLP:conf/www/JaffriGM08}{{67}{2008}{{Jaffri et~al.}}{{Jaffri, Glaser, and Millard}}}
\bibcite{DBLP:journals/ijswis/FerraraNS11}{{68}{2011}{{Ferrara et~al.}}{{Ferrara, Nikolov, and Scharffe}}}
\bibcite{MaurouxHJAM09}{{69}{2009}{{Cudr{\'e}-Mauroux et~al.}}{{Cudr{\'e}-Mauroux, Haghani, Jost, Aberer, and de~Meer}}}
\bibcite{DBLP:series/synthesis/2011Gal}{{70}{2011}{{Gal}}{{}}}
\bibcite{DBLP:conf/rweb/Parsia06}{{71}{2006}{{Parsia}}{{}}}
\bibcite{DBLP:conf/icde/LabordaC06}{{72}{2006}{{de~Laborda and Conrad}}{{}}}
\bibcite{DBLP:conf/esws/DietzoldA07}{{73}{2007}{{Dietzold and Auer}}{{}}}
\bibcite{DBLP:conf/aswc/CornoCCV08}{{74}{2008}{{Corno et~al.}}{{Corno, Corcoglioniti, Celino, and Valle}}}
\bibcite{DBLP:conf/semweb/GorlitzS11}{{75}{2011{}}{{G{\"o}rlitz and Staab}}{{}}}
\bibcite{DBLP:conf/semweb/MontoyaVCRA12}{{76}{2012}{{Montoya et~al.}}{{Montoya, Vidal, Corcho, Ruckhaus, and Aranda}}}
\bibcite{DBLP:conf/wsdm/PapadakisINF11}{{77}{2011}{{Papadakis et~al.}}{{Papadakis, Ioannou, Nieder{\'e}e, and Fankhauser}}}
\bibcite{DBLP:books/daglib/0023820}{{78}{2010}{{Russell and Norvig}}{{}}}
\bibcite{DBLP:journals/tods/PerezAG09}{{79}{2009}{{P{\'e}rez et~al.}}{{P{\'e}rez, Arenas, and Gutierrez}}}
\bibcite{DBLP:conf/soda/CarrDKM00}{{80}{2000}{{Carr et~al.}}{{Carr, Doddi, Konjevod, and Marathe}}}
\bibcite{DBLP:books/mk/WittenF99}{{81}{1999}{{Witten and Frank}}{{}}}
\bibcite{DBLP:conf/nips/NgJ01}{{82}{2001}{{Ng and Jordan}}{{}}}
\bibcite{INSR:INSR385}{{83}{2001}{{Hand and Yu}}{{}}}
\bibcite{DBLP:journals/jods/EuzenatMSSS11}{{84}{2011{}}{{Euzenat et~al.}}{{Euzenat, Meilicke, Stuckenschmidt, Shvaiko, and dos Santos}}}
\bibcite{serimi}{{85}{2012}{{Araujo et~al.}}{{Araujo, Tran, de~Vries, Hidders, and Schwabe}}}
\bibcite{DBLP:conf/semweb/HuCCQ10}{{86}{2010}{{Hu et~al.}}{{Hu, Chen, Cheng, and Qu}}}
\bibcite{DBLP:journals/tkde/LiTLL09}{{87}{2009}{{Li et~al.}}{{Li, Tang, Li, and Luo}}}
\bibcite{DBLP:journals/jair/BhattacharyaG07}{{88}{2007}{{Bhattacharya and Getoor}}{{}}}
\bibcite{DBLP:journals/pvldb/MetwallyF12}{{89}{2012}{{Metwally and Faloutsos}}{{}}}
\bibcite{DBLP:conf/www/HerzigT12}{{90}{2012}{{Herzig and Tran}}{{}}}
\bibcite{DBLP:journals/expert/Fayyad96}{{91}{1996}{{Fayyad}}{{}}}
\bibcite{DBLP:journals/debu/RahmD00}{{92}{2000}{{Rahm and Do}}{{}}}
\bibcite{DBLP:conf/popl/Gulwani11}{{93}{2011}{{Gulwani}}{{}}}
\bibcite{DBLP:journals/cacm/GulwaniHS12}{{94}{2012}{{Gulwani et~al.}}{{Gulwani, Harris, and Singh}}}
\bibcite{DBLP:journals/aim/Lau09}{{95}{2009}{{Lau}}{{}}}
\bibcite{DBLP:conf/icai/MichelsonK09}{{96}{2009}{{Michelson and Knoblock}}{{}}}
\bibcite{DBLP:conf/emnlp/OkazakiTAT08}{{97}{2008}{{Okazaki et~al.}}{{Okazaki, Tsuruoka, Ananiadou, and ichi Tsujii}}}
\bibcite{levelshtein-66-binary}{{98}{1966}{{Levenshtein}}{{}}}
\bibcite{2009design}{{99}{2009}{{200}}{{}}}
\bibcite{DBLP:books/daglib/0023376}{{100}{2009}{{Cormen et~al.}}{{Cormen, Leiserson, Rivest, and Stein}}}
\bibcite{DBLP:books/cu/Gusfield1997}{{101}{1997}{{Gusfield}}{{}}}
\bibcite{DBLP:books/daglib/0019552}{{102}{2006}{{Linz}}{{}}}
\bibcite{Ziegler:2005:IRL:1060745.1060754}{{103}{2005}{{Ziegler et~al.}}{{Ziegler, McNee, Konstan, and Lausen}}}
\bibcite{DBLP:conf/uai/ChengG99}{{104}{1999}{{Cheng and Greiner}}{{}}}
\bibcite{1183917}{{105}{2002}{{Molina et~al.}}{{Molina, Belanche, and Nebot}}}
\bibcite{DBLP:journals/aai/RatanamahatanaG03}{{106}{2003}{{Ratanamahatana and Gunopulos}}{{}}}
\bibcite{DBLP:conf/dexa/PatroW11}{{107}{2011}{{Patro and Wang}}{{}}}
\bibcite{DBLP:conf/kdd/TejadaKM02}{{108}{2002}{{Tejada et~al.}}{{Tejada, Knoblock, and Minton}}}
\bibcite{Bouchard04thetrade-off}{{109}{2004}{{Bouchard and Triggs}}{{}}}
\bibcite{DBLP:journals/pvldb/SinghG12}{{110}{2012}{{Singh and Gulwani}}{{}}}
\bibcite{DBLP:conf/aaai/WuSK12}{{111}{2012}{{Wu et~al.}}{{Wu, Szekely, and Knoblock}}}
\bibcite{conf/acl/SattaH97}{{112}{1997}{{Satta and Henderson}}{{}}}
\bibcite{DBLP:conf/vldb/RamanH01}{{113}{2001}{{Raman and Hellerstein}}{{}}}
\bibcite{trec-kba-overview-2012}{{114}{2012}{{Frank et~al.}}{{Frank, Kleiman-Weiner, Roberts, Niu, Zhang, Re, and Soboroff}}}
\bibcite{DBLP:conf/semweb/AuerBKLCI07}{{115}{2007}{{Auer et~al.}}{{Auer, Bizer, Kobilarov, Lehmann, Cyganiak, and Ives}}}
\bibcite{DBLP:journals/ws/BizerLKABCH09}{{116}{2009{}}{{Bizer et~al.}}{{Bizer, Lehmann, Kobilarov, Auer, Becker, Cyganiak, and Hellmann}}}
\bibcite{DBLP:conf/esws/KobilarovSROSSBL09}{{117}{2009}{{Kobilarov et~al.}}{{Kobilarov, Scott, Raimond, Oliver, Sizemore, Smethurst, Bizer, and Lee}}}
\@writefile{toc}{\contentsline {chapter}{SIKS Dissertations}{147}{appendix*.615}}
\@writefile{lof}{\addvspace {10\p@ }}
\@writefile{lot}{\addvspace {10\p@ }}
